SEQUENCE LISTING 



<110> ADLER, JON ELLIOT 
ZOZULYA, SERGEY 
LI, XIADONG 
O'CONNELL, SHAWN 
STASZEWSKI, LENA 

<120> T1R TASTE RECEPTORS AND GENES ENCODING SAME 

<130> 0780'03/0277870/RXT 

<140> 09/799,629 
<141> 2001-03-07 

<150> 60/187,546 
<151> 2000-03-07 

<150> 60/195,536 
<151> 2000-04-07 

<150> 60/209,840 
<151> 2000-06-06 

<150> 60/214,213 
<151> 2000-06-23 

<150> 60/226,448 
<151> 2000-08-17 

<150> 60/259,227 
<151> 2001-01-03 

<160> 20 

<170> PatentIn Ver. 2.1 

<210> 1 
<211> 876 
<212> DNA 

<213> Homo sapiens 
<400> 1 

agcctggcag tggcctcagg 
ggacaccact ggggccccag 
tcctctgccc gctccccgcc 
ctgccgtgcc tgttggaagt 
ctctgggctc tcctgcaccc 
atgaaggggg actacgtgct 
ctccgcagcc ggacacggcc 
tgggtcgggg tcagggtgac 
ctgcggttct gtgtggcccc 
aaatggccgt ggaggagatc 
acgacctctt tgatacgtgc 
tggccaaggc aggcagccgc 
gtgtgctggc tgtcatcggg 
tcagcttctt cctcatgccc 
cctgccccgt gggagcccct 



cagagtctga cgcgcacaaa ctttcaggcc caggaagcga 60 
ggtgtggcaa gtgaggatgg caagggtttt gctaaacaaa 120 
ccgggctcac tccatgtgag gccccagtcg gggcagccac 180 
tgcctctgcc atgctgggcc ctgctgtcct gggcctcagc 240 
tgggacgggg gccccattgt gcctgtcaca gcaacttagg 300 
gggggggctg ttccccctgg gcgaggccga ggaggctggc 360 
cagcagccct gtgtgcacca ggtacagagg tgggacggcc 420 
caggtctggg gtgctcctga gctggggccg aggtggccat 480 
aggttctcct caaacggcct gctctgggca ctggccatga 540 
aacaacaagt cggatctgct gcccgggctg cgcctgggct 600 
tcggagcctg tggtggccat gaagcccagc ctcatgttcc 660 
gacatcgccg cctactgcaa ctacacgcag taccagcccc 720 
ccccactcgt cagagctcgc catggtcacc ggcaagttct 780 
cagtggggcg ccccccacca tcacccaccc ccaaccaacc 840 
tgtgtcagga gaatgc 876 



o 



<210> 2 

<211> 2687 

<212> DNA 

<213> Homo sapiens 



<400> 2 

tacatgcacc 

gcaggtcagc 

cttccgcacc 

gttcggctgg 

gagcatcttc 

gccgctgccc 

gaaccagagc 

cttcaactac 

gctgacctct 

cttcctccag 

cctggccacc 

ggacgtggtg 

agggctaaat 

cctgcacaac 

ctggcaggtg 

gcacggccac 

gctcctggag 

cagcagcgga 

gcccaggctc 

ccgctggcac 

gtagcccccg 

gcccagccga 

cggcagtgcc 

tgtgtggact 

gcgggggtgg 

cacagggtac 

accttttgtg 

tctcggttcc 

gcgctgggcc 

gttcaggcct 

ctcagcgtcc 

ttgtcccacc 

ttcgtggagt 

ccctgggcct 

tacctggtgg 

ctggtgcact 

acgctggcct 

aaccgtgccc 

gtgcccctcc 

ctgctctgtg 

cggcagccag 

ggccagaatg 

tcagccccgg 

tcgctacaga 

cacagtgagc 



ccacccagcc 
tacggtgcta 
gtgcccagcg 
aactgggtgg 
tcggccctgg 
cgtgccgatg 
agcgtgcagg 
agcatcagca 
gacctggtca 
aggggtgccc 
gacccggcct 
ggccagcgct 
caccaccaga 
actcttcagt 
agcccgggag 
cacgcctgag 
aacatgtaca 
aacgtggaca 
cacgacgtgg 
acgtctgaca 
cggcagggcg 
gcagagccag 
aggagggcca 
gcgaggcggg 
gaacgcagca 
aagacgaaca 
gccaggatga 
tggcatgggg 
ttgtgctggc 
cgggggggcc 
tcctgttccc 
tcccgctcac 
cagaactgcc 
ggctggtggt 
ccttcccgcc 
gccgcacacg 
ttctctgctt 
gtggcctcac 
tggccaatgt 
tcctgggcat 
ggctcaacac 
acgggaacac 
tgaacccaga 
gaccctcccg 
cctaggcctg 



ctgccctggg 
gcatggagct 
accgtgtgca 
ccgccctggg 
ccgcggcacg 
actcgcggct 
tggtgctgct 
gcaggctctc 
tggggctgcc 
agctgcacga 
tctgctctgc 
gcccgcagtg 
cgttctctgt 
gcaacgcctc 
atgggggtgt 
ctggaggtgg 
acctgacctt 
tggagtacga 
gcaggttcaa 
accaggtgag 
cagcctgggg 
accccaggcc 
ggtgcgccgg 
cagctaccgg 
ggggagggtc 
cccagcgccc 
gtggtccccg 
cgagccggct 
tgctttgggg 
cctggcctgc 
tggccagccc 
gggctgcctg 
tctgagctgg 
gctgctggcc 
ggaggtggtg 
ctcctgggtc 
cctgggcact 
ctttgccatg 
gcaggtggtc 
cctggctgcc 
ccccgagttc 
aggaaatcag 
cttagctgcg 
ctctaggttc 
gagcacgtgg 



agccctgtgt 
gctgagcgcc 
gctgacggcc 
cagcgacgac 
cggcatctgc 
ggggaaggtg 
gttcgcctcc 
gcccaaggtg 
cggcatggcc 
gttcccccag 
cctgggcgag 
tgactgcatc 
ctacgcagct 
aggctgcccc 
gctgtcctct 
ctggcggctc 
ccacgtgggc 
cctgaagctg 
cggcagcctc 
gtgagggtgg 
gtgggggccg 
tgtgcgcaga 
gtcaaggggt 
caaaacccag 
ctgccaagtc 
ttctcctctc 
gagcgaagca 
gtgctgctgc 
ctgttcgttc 
tttggcctgg 
agccctgccc 
agcacactct 
gcagaccggc 
atgctggtgg 
acggactggc 
agcttcggcc 
ttcctggtgc 
ctggcctact 
ctcaggcccg 
ttccacctgc 
ttcctgggag 
gggaaacatg 
atccccccca 
tgaccccagg 
acacccctgt 



cagaagatgc 
cgggagacct 
gccgcggagc 
gagtacggcc 
atcgcgcacg 
caggacgtcc 
gtgcacgccg 
tgggtggcca 
cagatgggca 
tacgtgaaga 
agggagcagg 
acgctgcaga 
gtgtatagcg 
gcgcaggacc 
gcatgtgccc 
agccccgtcc 
gggctgccgc 
tgggtgtggc 
aggacagagc 
gtgtgccagg 
ttccagtctc 
agcccgtgtc 
tccactcctg 
gtgagccgcc 
ctgactctga 
tcacagacga 
cacgctgctt 
tgctcctgct 
accatcggga 
tgtgcctggg 
gatgcctggc 
tcctgcaggc 
tgagtggctg 
aggtcgcact 
acatgctgcc 
tagcgcacgc 
ggagccagcc 
tcatcacctg 
ccgtgcagat 
ccaggtgtta 
ggggccctgg 
agtgacccaa 
agccagcaat 
ttgtctcctg 
gaccatc 



tcttggcctt 

tcccctcctt 

tgctgcagga 

ggcagggcct 

agggcctggt 

tgcaccaggt 

cccacgccct 

gcgaggcctg 

cggtgcttgg 

cgcacctggc 

gtctggagga 

acgtgagcgc 

tggcccaggc 

ccgtgaagcc 

aggccaccag 

cccgcccgca 

tgcggttcga 

agggctcagt 

gcctgaagat 

cgtgcccgtg 

ccgtgggcat 

ccggtgctcg 

ctgctacgac 

ttcccggcag 

gaccagagcc 

catcgcctgc 

ccgccgcagg 

gctgagcctg 

cagcccactg 

cctggtctgc 

ccagcagccc 

ggccgagatc 

cctgcggggg 

gtgcacctgg 

cacggaggcg 

caccaatgcc 

gggctgctac 

ggtctccttt 

gggcgccctc 

cctgctcatg 

ggatgcccaa 

ccctgtgatc 

gacccgtgtc 

accctgaccc 



60 

120 

180 

240 

300 

360 

420 

480 

540 

600 

660 

720 

780 

840 

900 

960 

1020 

1080 

1140 

1200 

1260 

1320 

1380 

1440 

1500 

1560 

1620 

1680 

1740 

1800 

1860 

1920 

1980 

2040 

2100 

2160 

2220 

2280 

2340 

2400 

2460 

2520 

2580 

2640 

2687 



<210> 3 
<211> 2553 



o 



<212> DNA 

<213> Homo sapiens 



<400> 3 

atgctgggcc 

gccccattgt 

ttccccctgg 

gtgtgcacca 

gaggagatca 

gatacgtgct 

ggcagccgcg 

gtcatcgggc 

ctcatgcccc 

ttcttccgca 

gagttcggct 

ctgagcatct 

gtgccgctgc 

gtgaaccaga 

ctcttcaact 

tggctgacct 

ggcttcctcc 

gccctggcca 

gaggacgtgg 

gcagggctaa 

gccctgcaca 

ccctggcagc 

cggttcgaca 

ggctcagtgc 

ctgaagatcc 

tgccaggagg 

gactgcgagg 

caggatgagt 

gcatggggcg 

gtgctggctg 

ggggggcccc 

ctgttccctg 

ccgctcacgg 

gaactgcctc 

ctggtggtgc 

ttcccgccgg 

cgcacacgct 

ctctgcttcc 

ggcctcacct 

gccaatgtgc 

ctgggcatcc 

ctcaacaccc 

gggaacacag 



ctgctgtcct 
gcctgtcaca 
gcgaggccga 
ggttctcctc 
acaacaagtc 
cggagcctgt 
acatcgccgc 
cccactcgtc 
actacggtgc 
ccgtgcccag 
ggaactgggt 
tctcggccct 
cccgtgccga 
gcagcgtgca 
acagcatcag 
ctgacctggt 
agaggggtgc 
ccgacccggc 
tgggccagcg 
atcaccacca 
acactcttca 
tcctggagaa 
gcagcggaaa 
ccaggctcca 
gctggcacac 
gccaggtgcg 
cgggcagcta 
ggtccccgga 
agccggctgt 
ctttggggct 
tggcctgctt 
gccagcccag 
gctgcctgag 
tgagctgggc 
tgctggccat 
aggtggtgac 
cctgggtcag 
tgggcacttt 
ttgccatgct 
aggtggtcct 
tggctgcctt 
ccgagttctt 
gaaatcaggg 



gggcctcagc 
gcaacttagg 
ggaggctggc 
aaacggcctg 
ggatctgctg 
ggtggccatg 
ctactgcaac 
agagctcgcc 
tagcatggag 
cgaccgtgtg 
ggccgccctg 
ggccgcggca 
tgactcgcgg 
ggtggtgctg 
cagcaggctc 
catggggctg 
ccagctgcac 
cttctgctct 
ctgcccgcag 
gacgttctct 
gtgcaacgcc 
catgtacaac 
cgtggacatg 
cgacgtgggc 
gtctgacaac 
ccgggtcaag 
ccggcaaaac 
gcgaagcaca 
gctgctgctg 
gttcgttcac 
tggcctggtg 
ccctgcccga 
cacactcttc 
agaccggctg 
gctggtggag 
ggactggcac 
cttcggccta 
cctggtgcgg 
ggcctacttc 
caggcccgcc 
ccacctgccc 
cctgggaggg 
gaaacatgag 



ctctgggctc 
atgaaggggg 
ctccgcagcc 
ctctgggcac 
cccgggctgc 
aagcccagcc 
tacacgcagt 
atggtcaccg 
ctgctgagcg 
cagctgacgg 
ggcagcgacg 
cgcggcatct 
ctggggaagg 
ctgttcgcct 
tcgcccaagg 
cccggcatgg 
gagttccccc 
gccctgggcg 
tgtgactgca 
gtctacgcag 
tcaggctgcc 
ctgaccttcc 
gagtacgacc 
aggttcaacg 
cagaagcccg 
gggttccact 
ccagacgaca 
cgctgcttcc 
ctcctgctgc 
catcgggaca 
tgcctgggcc 
tgcctggccc 
ctgcaggcgg 
agtggctgcc 
gtcgcactgt 
atgctgccca 
gcgcacgcca 
agccagccgg 
atcacctggg 
gtgcagatgg 
aggtgttacc 
ggccctgggg 
tga 



tcctgcaccc 
actacgtgct 
ggacacggcc 
tggccatgaa 
gcctgggcta 
tcatgttcct 
accagccccg 
gcaagttctt 
cccgggagac 
ccgccgcgga 
acgagtacgg 
gcatcgcgca 
tgcaggacgt 
ccgtgcacgc 
tgtgggtggc 
cccagatggg 
agtacgtgaa 
agagggagca 
tcacgctgca 
ctgtgtatag 
ccgcgcagga 
acgtgggcgg 
tgaagctgtg 
gcagcctcag 
tgtcccggtg 
cctgctgcta 
tcgcctgcac 
gccgcaggtc 
tgagcctggc 
gcccactggt 
tggtctgcct 
agcagccctt 
ccgagatctt 
tgcgggggcc 
gcacctggta 
cggaggcgct 
ccaatgccac 
gctgctacaa 
tctcctttgt 
gcgccctcct 
tgctcatgcg 
atgcccaagg 



tgggacgggg 

gggggggctg 

cagcagccct 
aatggccgtg 
cgacctcttt 
ggccaaggca 
tgtgctggct 
cagcttcttc 
cttcccctcc 
gctgctgcag 
ccggcagggc 
cgagggcctg 
cctgcaccag 
cgcccacgcc 
cagcgaggcc 
cacggtgctt 
gacgcacctg 
gggtctggag 
gaacgtgagc 
cgtggcccag 
ccccgtgaag 
gctgccgctg 
ggtgtggcag 
gacagagcgc 
ctcgcggcag 
cgactgtgtg 
cttttgtggc 
tcggttcctg 
gctgggcctt 
tcaggcctcg 
cagcgtcctc 
gtcccacctc 
cgtggagtca 
ctgggcctgg 
cctggtggcc 
ggtgcactgc 
gctggccttt 
ccgtgcccgt 
gcccctcctg 
gctctgtgtc 
gcagccaggg 
ccagaatgac 



60 

120 

180 

240 

300 

360 

420 

480 

540 

600 

660 

720 

780 

840 

900 

960 

1020 

1080 

1140 

1200 

1260 

1320 

1380 

1440 

1500 

1560 

1620 

1680 

1740 

1800 

1860 

1920 

1980 

2040 

2100 

2160 

2220 

2280 

2340 

2400 

2460 

2520 

2553 



<210> 4 

<211> 850 

<212> PRT 

<213> Homo sapiens 

<400> 4 

Met Leu Gly Pro Ala Val Leu Gly Leu Ser Leu Trp Ala Leu Leu His 
1 5 10 15 




Pro Gly Thr Gly Ala Pro Leu Cys Leu Ser Gln Gln Leu Arg Met Lys 
20 25 30 

Gly Asp Tyr Val Leu Gly Gly Leu Phe Pro Leu Gly Glu Ala Glu Glu 
35 40 45 

Ala Gly Leu Arg Ser Arg Thr Arg Pro Ser Ser Pro Val Cys Thr Arg 
50 55 60 

Phe Ser Ser Asn Gly Leu Leu Trp Ala Leu Ala Met Lys Met Ala Val 
65 70 75 80 

Glu Glu Ile Asn Asn Lys Ser Asp Leu Leu Pro Gly Leu Arg Leu Gly 
85 90 95 

Tyr Asp Leu Phe Asp Thr Cys Ser Glu Pro Val Val Ala Met Lys Pro 
100 105 110 

Ser Leu Met Phe Leu Ala Lys Ala Gly Ser Arg Asp Ile Ala Ala Tyr 
115 120 125 

Cys Asn Tyr Thr Gln Tyr Gln Pro Arg Val Leu Ala Val Ile Gly Pro 
130 135 140 

His Ser Ser Glu Leu Ala Met Val Thr Gly Lys Phe Phe Ser Phe Phe 
145 150 155 160 

Leu Met Pro His Tyr Gly Ala Ser Met Glu Leu Leu Ser Ala Arg Glu 
165 170 175 

Thr Phe Pro Ser Phe Phe Arg Thr Val Pro Ser Asp Arg Val Gln Leu 
180 185 190 

Thr Ala Ala Ala Glu Leu Leu Gln Glu Phe Gly Trp Asn Trp Val Ala 
195 200 205 

Ala Leu Gly Ser Asp Asp Glu Tyr Gly Arg Gln Gly Leu Ser Ile Phe 
210 215 220 

Ser Ala Leu Ala Ala Ala Arg Gly Ile Cys Ile Ala His Glu Gly Leu 
225 230 235 240 

Val Pro Leu Pro Arg Ala Asp Asp Ser Arg Leu Gly Lys Val Gln Asp 
245 250 255 

Val Leu His Gln Val Asn Gln Ser Ser Val Gln Val Val Leu Leu Phe 
260 265 270 

Ala Ser Val His Ala Ala His Ala Leu Phe Asn Tyr Ser Ile Ser Ser 
275 280 285 

Arg Leu Ser Pro Lys Val Trp Val Ala Ser Glu Ala Trp Leu Thr Ser 
290 295 300 



Asp Leu Val Met Gly Leu Pro Gly Met Ala Gln Met Gly Thr Val Leu 
305 310 315 320 



o o 



Gly Phe Leu Gln Arg Gly Ala Gln Leu His Glu Phe Pro Gln Tyr Val 
325 330 335 

Lys Thr His Leu Ala Leu Ala Thr Asp Pro Ala Phe Cys Ser Ala Leu 
340 345 350 

Gly Glu Arg Glu Gln Gly Leu Glu Glu Asp Val Val Gly Gln Arg Cys 
355 360 365 

Pro Gln Cys Asp Cys Ile Thr Leu Gln Asn Val Ser Ala Gly Leu Asn 
370 375 380 

His His Gln Thr Phe Ser Val Tyr Ala Ala Val Tyr Ser Val Ala Gln 
385 390 395 400 

Ala Leu His Asn Thr Leu Gln Cys Asn Ala Ser Gly Cys Pro Ala Gln 
405 410 415 

Asp Pro Val Lys Pro Trp Gln Leu Leu Glu Asn Met Tyr Asn Leu Thr 
420 425 430 

Phe His Val Gly Gly Leu Pro Leu Arg Phe Asp Ser Ser Gly Asn Val 
435 440 445 

Asp Met Glu Tyr Asp Leu Lys Leu Trp Val Trp Gln Gly Ser Val Pro 
450 455 460 

Arg Leu His Asp Val Gly Arg Phe Asn Gly Ser Leu Arg Thr Glu Arg 
465 470 475 480 

Leu Lys Ile Arg Trp His Thr Ser Asp Asn Gln Lys Pro Val Ser Arg 
485 490 495 

Cys Ser Arg Gln Cys Gln Glu Gly Gln Val Arg Arg Val Lys Gly Phe 
500 505 510 

His Ser Cys Cys Tyr Asp Cys Val Asp Cys Glu Ala Gly Ser Tyr Arg 
515 520 525 

Gln Asn Pro Asp Asp Ile Ala Cys Thr Phe Cys Gly Gln Asp Glu Trp 
530 535 540 

Ser Pro Glu Arg Ser Thr Arg Cys Phe Arg Arg Arg Ser Arg Phe Leu 
545 550 555 560 

Ala Trp Gly Glu Pro Ala Val Leu Leu Leu Leu Leu Leu Leu Ser Leu 
565 570 575 

Ala Leu Gly Leu Val Leu Ala Ala Leu Gly Leu Phe Val His His Arg 
580 585 590 

Asp Ser Pro Leu Val Gln Ala Ser Gly Gly Pro Leu Ala Cys Phe Gly 
595 600 605 



Leu Val Cys Leu Gly Leu Val Cys Leu Ser Val Leu Leu Phe Pro Gly 
610 615 620 



Gln Pro Ser Pro Ala Arg Cys Leu Ala Gln Gln Pro Leu Ser His Leu 
625 630 635 640 

Pro Leu Thr Gly Cys Leu Ser Thr Leu Phe Leu Gln Ala Ala Glu Ile 
645 650 655 

Phe Val Glu Ser Glu Leu Pro Leu Ser Trp Ala Asp Arg Leu Ser Gly 
660 665 670 

Cys Leu Arg Gly Pro Trp Ala Trp Leu Val Val Leu Leu Ala Met Leu 
675 680 685 

Val Glu Val Ala Leu Cys Thr Trp Tyr Leu Val Ala Phe Pro Pro Glu 
690 695 700 

Val Val Thr Asp Trp His Met Leu Pro Thr Glu Ala Leu Val His Cys 
705 710 715 720 

Arg Thr Arg Ser Trp Val Ser Phe Gly Leu Ala His Ala Thr Asn Ala 
725 730 735 

Thr Leu Ala Phe Leu Cys Phe Leu Gly Thr Phe Leu Val Arg Ser Gln 
740 745 750 

Pro Gly Cys Tyr Asn Arg Ala Arg Gly Leu Thr Phe Ala Met Leu Ala 
755 760 765 

Tyr Phe Ile Thr Trp Val Ser Phe Val Pro Leu Leu Ala Asn Val Gln 
770 775 780 

Val Val Leu Arg Pro Ala Val Gln Met Gly Ala Leu Leu Leu Cys Val 
785 790 795 800 

Leu Gly Ile Leu Ala Ala Phe His Leu Pro Arg Cys Tyr Leu Leu Met 
805 810 815 

Arg Gln Pro Gly Leu Asn Thr Pro Glu Phe Phe Leu Gly Gly Gly Pro 
820 825 830 

Gly Asp Ala Gln Gly Gln Asn Asp Gly Asn Thr Gly Asn Gln Gly Lys 
835 840 845 

His Glu 
850 



<210> 5 
<211> 23 
<212> DNA 

<213> Artificial Sequence 
<220> 

<221> modified_base 
<222> (3) 

<223> a, c, t, g, other or unknown 
<220> 

<221> modified_base 



o 



<222> (9) 

<223> a, c, t, g, other or unknown 
<220> 

<221> modified_base 
<222> (12) 

<223> a, c, t, g, other or unknown 
<220> 

<221> modified_base 
<222> (18) 

<223> a, c, t, g, other or unknown 
<220> 

<223> Description of Artificial Sequence: Primer 
<400> 5 

cgnttyytng cntggggnga rcc 



<210> 6 
<211> 23 
<212> DNA 

<213> Artificial Sequence 
<220> 

<221> modified_base 
<222> (3) 

<223> a, c, t, g, other or unknown 
<220> 

<221> modified_base 
<222> (6) 

<223> a, c, t, g, other or unknown 
<220> 

<221> modified_base 
<222> (18) 

<223> a, c, t, g, other or unknown 
<220> 

<221> modified_base 
<222> (21) 

<223> a, c, t, g, other or unknown 
<220> 

<223> Description of Artificial Sequence: Primer 
<400> 6 

cgngcncgrt trtarcancc ngg 



<210> 7 

<211> 9 

<212> PRT 

<213> Homo sapiens 



o 



o 



8 

<400> 7 

Arg Phe Leu Ala Trp Gly Glu Pro Ala 
1 5 



<210> 8 

<211> 8 

<212> PRT 

<213> Homo sapiens 

<400> 8 

Pro Gly Cys Tyr Asn Arg Ala Arg 
1 5 



<210> 9 
<211> 552 
<212> DNA 
<213> Mus sp. 



<400> 9 

gtgctgtcac 

ctctctgtcc 

tttggcctga 

agctctgcca 

agcacactct 

gcaaactggc 

tttgtggagg 

tggtcagtgc 

ggcttggtgc 

gtacaagacc 



tcctcctgct 
accactggga 
tctgcctagg 
gctgccttgc 
tcctgcaagc 
tatgcagcta 
cagcactatg 
tgcccacaga 
acatcaccaa 
ag 



gctttgcctg 
cagccctctt 
cctcttctgc 
acaacaacca 
agctgagacc 
ccttcgggac 
tgcctggtat 
ggtactggag 
tgcaatggta 



gtgctgggtc 
gtccaggcct 
ctcagtgtcc 
atggctcacc 
tttgtggagt 
tctggcctgc 
ttgaccgctt 
cactgccacg 
gcttttctct 



tagcactggc 
caggcggctc 
ttctgttccc 
tccctctcac 
ctgagctgcc 
tagtggtact 
caccagaagt 
tgcgttcctg 
gctttctggg 



tgctctgggg 60 
acagttctgc 120 
aggacggcca 180 
aggctgcctg 240 
actgagctgg 300 
gttggccact 360 
ggtgacagac 420 
ggtcaacctg 480 
cactttcctg 540 
552 



<210> 10 

<211> 184 

<212> PRT 

<213> Mus sp. 

<400> 10 
Val Leu Ser Leu 
1 

Ala Ala Leu Gly 
20 

Ala Ser Gly Gly 
35 

Phe Cys Leu Ser 
50 

Cys Leu Ala Gin 
65 

Ser Thr Leu Phe 



Leu Leu Leu Leu 
5 

Leu Ser Val His 



Ser Gin Phe Cys 
40 

Val Leu Leu Phe 
55 

Gin Pro Met Ala 
70 

Leu Gin Ala Ala 
85 



Cys Leu Val Leu 
10 

His Trp Asp Ser 
25 

Phe Gly Leu lie 



Pro Gly Arg Pro 
60 

His Leu Pro Leu 
75 

Glu Thr Phe Val 
90 



Gly Leu Ala Leu 
15 

Pro Leu Val Gin 
30 

Cys Leu Gly Leu 
45 

Ser Ser Ala Ser 



Thr Gly Cys Leu 
80 

Glu Ser Glu Leu 
95 



n 



o 



Pro Leu Ser Trp 
100 

Leu Leu Val Val 
115 

Trp Tyr Leu Thr 
130 

Pro Thr Glu Val 
145 

Gly Leu Val His 



Gly Thr Phe Leu 
180 



Ala Asn Trp Leu 



Leu Leu Ala Thr 
120 

Ala Ser Pro Glu 
135 

Leu Glu His Cys 
150 

lie Thr Asn Ala 
165 

Val Gin Asp Gin 



9 

Cys Ser Tyr Leu 
105 

Phe Val Glu Ala 



Val Val Thr Asp 
140 

His Val Arg Ser 
155 

Met Val Ala Phe 
170 



Arg Asp Ser Gly 
110 

Ala Leu Cys Ala 
125 

Trp Ser Val Leu 



Trp Val Asn Leu 
160 

Leu Cys Phe Leu 
175 



<210> 11 
<211> 558 
<212> DNA 
<213> Rattus sp. 



<400> 11 

gtgctgtcac 

ctctttgtcc 

tttggcctga 

cgctctgcca 

agcacactct 

gcaaactggc 

actcttgtgg 

acagattggc 

agcctgggct 

ttcctggtac 



ttctcctgct 
actactggga 
tctgcctagg 
gctgccttgc 
tcctgcaagc 
tctgcagcta 
aggctgcact 
aggtgctgcc 
tggtgcacat 
aaagccag 



gctttgcctg 
cagccctctt 
cctcttctgc 
ccaacaacca 
agccgagatc 
ccttcggggc 
atgtgcctgg 
cacggaggta 
caccaatgca 



gtgctgggcc 
gttcaggcct 
ctcagtgtcc 
atggctcacc 
tttgtggagt 
ccctgggctt 
tacttgatgg 
ctggaacact 

ggggtagctt 



tgacactggc 
caggtgggtc 
ttctgttccc 
tccctctcac 
ctgagctgcc 
ggctggtggt 
ctttccctcc 
gccgcatgcg 
tcctctgctt 



tgccctgggg 60 
actgttctgc 120 
aggacgacca 180 
aggctgcctg 240 
actgagttgg 300 
actgctggcc 360 
agaggtggtg 420 
ttcctgggtc 480 
tctgggcact 540 
558 



<210> 12 
<211> 186 
<212> PRT 
<213> Rattus sp. 

<400> 12 

Val Leu Ser Leu Leu Leu Leu Leu Cys Leu Val Leu Gly Leu Thr Leu 
1 5 10 15 

Ala Ala Leu Gly Leu Phe Val His Tyr Trp Asp Ser Pro Leu Val Gin 
20 25 30 

Ala Ser Gly Gly Ser Leu Phe Cys Phe Gly Leu lie Cys Leu Gly Leu 
35 40 45 



Phe Cys Leu Ser Val Leu Leu Phe Pro Gly Arg Pro Arg Ser Ala Ser 
50 55 60 



Cys Leu Ala Gin Gin Pro Met Ala His Leu Pro Leu Thr Gly Cys Leu 
65 70 75 80 



oo 



oo 



Ser Thr Leu Phe Leu 
85 

Pro Leu Ser Trp Ala 
100 

Ala Trp Leu Val Val 
115 

Ala Trp Tyr Leu Met 
130 

Val Leu Pro Thr Glu 
145 

Ser Leu Gly Leu Val 
165 

Phe Leu Gly Thr Phe 
180 



10 

Gin Ala Ala Glu He 
90 

Asn Trp Leu Cys Ser 
105 

Leu Leu Ala Thr Leu 
120 

Ala Phe Pro Pro Glu 
135 

Val Leu Glu His Cys 
150 

His He Thr Asn Ala 
170 

Leu Val Gin Ser Gin 
185 



Phe Val Glu Ser Glu Leu 
95 

Tyr Leu Arg Gly Pro Trp 
110 

Val Glu Ala Ala Leu Cys 
125 

Val Val Thr Asp Trp Gin 
140 

Arg Met Arg Ser Trp Val 
155 160 

Gly Val Ala Phe Leu Cys 
175 



<210> 13 
<211> 2577 
<212> DNA 
<213> Rattus sp. 



<400> 13 

atgccgggtt 

tcctctttgt 

tttcccctgg 

ctatgtacca 

gaggagatca 

gacacatgct 

ggaagtcaaa 

gtcattggtc 

ctcatgccac 

ccatccttct 

ttgcagaatt 

gaaggtctga 

ggcctggtgc 

cgccaagtga 

tactcccttt 

gagtcctggc 

gttcttgggt 

cgccttgccc 

gaggagcgcg 

tcatctgggc 

tatgcagctg 

cattgccaca 

agtttccgtg 

tatgacctga 

ttcaacggca 

gtctcccagt 

tcctgctgct 

ttcacctgta 

cctcgcaggc 

ctttgcctgg 



tggctatctt 
gtctgtcaca 
gcacaactga 
ggttctcgcc 
acaatggatc 
cagagccagt 
gcattgctgc 
cccactcatc 
aggtcagcta 
tccgcacagt 
tcagctggaa 
gcatcttttc 
cacaacatga 
accaaagcaa 
ttagctacag 
tgacctctga 
ttctgcagcg 
tagctgctga 
tgatggggcc 
tgatgcagaa 
tgtacagtgt 
catcagagcc 
ctcgagactt 
agatgtgggt 
cccttcagct 
gctcccggca 
atgactgtgt 
ctccatgtgg 
ccaagtttct 
tgctgggcct 



gggcctcagt 
gcaattcaag 
ggaggccact 
ccttggtttg 
tgccttgctc 
ggtcaccatg 
ctactgcaac 
agagcttgcc 
tagtgccagc 
gcccagtgac 
ctgggtggct 
tggtctggcc 
cactagtggc 
agtacaggtg 
catccttcat 
cctggtcatg 
cggtgcccta 
cccaacattc 
acgctgttca 
cctatcagct 
ggctcaggcc 
tgttcaaccc 
gacactgcag 
gtggcagagc 
gcagcactcg 
gtgcaaagat 
ggactgcaag 
caaggatcag 
ggcttggggg 
gacactggct 



ctggctgctt 
gcacaagggg 
ctcaaccaga 
ttcctggcca 
cctgggctgc 
aagcccagcc 
tacacacagt 
ctcattacag 
atggatcggc 
cgggtgcagc 
gccttaggta 
aactcacgag 
caacaattgg 
gtggtgctgt 
gacctctcac 
acacttccca 
ctgcctgaat 
tgtgcctccc 
caatgtgact 
gggcagttgc 
cttcacaaca 
tggcagctcc 
tttgatgcca 
cctacacctg 
aaaatgtatt 
ggccaggtgc 
gcagggagct 
tggtccccag 
gagccagctg 
gccctggggc 



tcctggagct 
actatatatt 
gaacacagcc 
tggctatgaa 
gactgggcta 
tcatgttcat 
accaaccccg 
gcaagttctt 
taagtgaccg 
tgcaggccgt 
gtgatgatga 
gtatctgcat 
gcaaggtggt 
ttgcatctgc 
ccaaggtatg 
atattgcccg 
tttcccatta 
tgaaagctga 
acatcatgct 
accaccaaat 
ccctgcagtg 
tggagaacat 
aagggagtgt 
tactacatac 
ggccaggcaa 
gcagagtaaa 
accggaagca 
aaaaaagcac 
tgctgtcact 
tctttgtcca 



tgggatgggg 
gggtggacta 
caacggcatc 
gatggctgta 
tgacctgttt 
ggccaaggtg 
tgtgctggct 
cagcttcttc 
ggaaacattt 
tgtgacactg 
ctatggccgg 
tgcacacgag 
ggatgtgcta 
ccgtgctgtc 
ggtggccagt 
tgtgggcact 
tgtggagact 
gttggatctg 
acagaacctg 
atttgcaacc 
caatgtctca 
gtacaatatg 
agacatggaa 
tgtaggcacc 
ccaggtgcca 
gggctttcat 
tccagatgac 
aacctgctta 
tctcctgctg 
ctactgggac 



60 

120 

180 

240 

300 

360 

420 

480 

540 

600 

660 

720 

780 

840 

900 

960 

1020 

1080 

1140 

1200 

1260 

1320 

1380 

1440 

1500 

1560 

1620 

1680 

1740 

1800 



on 



no 



11 



agccctcttg 
ctcttctgcc 
caacaaccaa 
gccgagatct 
cttcggggcc 
tgtgcctggt 
acggaggtac 
accaatgcag 
ggtcgctata 
gtctcttttg 
ggtgctatct 
gtacttctgt 
gaagcatcag 



ttcaggcctc 
tcagtgtcct 
tggctcacct 
ttgtggagtc 
cctgggcttg 
acttgatggc 
tggaacactg 
tgttagcttt 
accgtgcccg 
tgcccctcct 
tattctgtgc 
ggctgccaga 
atgggaatag 



aggtgggtca 
tctgttccca 
ccctctcaca 
tgagctgcca 
gctggtggta 
tttccctcca 
ccgcatgcgt 
cctctgcttt 
tggcctcacc 
ggctaatgtg 
cctgggcatc 
gctcaacacc 
tggtagtagt 



ctgttctgct 
ggacgaccac 
ggctgcctga 
ctgagttggg 
ctgctggcca 
gaggtggtga 
tcctgggtca 
ctgggcactt 
ttcgccatgc 
caggtggcct 
ctggccacct 
caggagttct 
gaggcaactc 



ttggcctgat 
gctctgccag 
gcacactctt 
caaactggct 
ctcttgtgga 
cagattggca 
gcctgggctt 
tcctggtaca 
tagcttattt 
accagccagc 
tccacctgcc 
tcctgggaag 
ggggacacag 



ctgcctaggc 
ctgccttgcc 
cctgcaagca 
ctgcagctac 
ggctgcacta 
ggtgctgccc 
ggtgcacatc 
gagccagcct 
catcatctgg 
tgtgcagatg 
caaatgctat 
gagccccaag 
tgaatga 



1860 
1920 
1980 
2040 
2100 
2160 
2220 
2280 
2340 
2400 
2460 
2520 
2577 



<210> 14 
<211> 858 
<212> PRT 
<213> Rattus sp. 

<400> 14 

Met Pro Gly Leu Ala Ile Leu Gly Leu Ser Leu Ala Ala Phe Leu Glu 
1 5 10 15 

Leu Gly Met Gly Ser Ser Leu Cys Leu Ser Gln Gln Phe Lys Ala Gln 
20 25 30 

Gly Asp Tyr Ile Leu Gly Gly Leu Phe Pro Leu Gly Thr Thr Glu Glu 
35 40 45 

Ala Thr Leu Asn Gln Arg Thr Gln Pro Asn Gly Ile Leu Cys Thr Arg 
50 55 60 

Phe Ser Pro Leu Gly Leu Phe Leu Ala Met Ala Met Lys Met Ala Val 
65 70 75 80 

Glu Glu He Asn Asn Gly Ser Ala Leu Leu Pro Gly Leu Arg Leu Gly 
85 90 95 

Tyr Asp Leu Phe Asp Thr Cys Ser Glu Pro Val Val Thr Met Lys Pro 
100 105 110 

Ser Leu Met Phe Met Ala Lys Val Gly Ser Gin Ser He Ala Ala Tyr 
115 120 125 

Cys Asn Tyr Thr Gin Tyr Gin Pro Arg Val Leu Ala Val He Gly Pro 
130 135 140 

His Ser Ser Glu Leu Ala Leu He Thr Gly Lys Phe Phe Ser Phe Phe 
145 150 155 160 



Leu Met Pro Gin Val Ser Tyr Ser Ala Ser Met Asp Arg Leu Ser Asp 
165 170 175 



Arg Glu Thr Phe Pro Ser Phe Phe Arg Thr Val Pro Ser Asp Arg Val 
180 185 190 



oo oo 



12 

Gin Leu Gin Ala Val Val Thr Leu Leu Gin Asn Phe Ser Trp Asn Trp 
195 200 205 

Val Ala Ala Leu Gly Ser Asp Asp Asp Tyr Gly Arg Glu Gly Leu Ser 
210 215 220 

lie Phe Ser Gly Leu Ala Asn Ser Arg Gly lie Cys lie Ala His Glu 
225 230 235 240 

Gly Leu Val Pro Gin His Asp Thr Ser Gly Gin Gin Leu Gly Lys Val 
245 250 255 

Val Asp Val Leu Arg Gin Val Asn Gin Ser Lys Val Gin Val Val Val 
260 265 270 

Leu Phe Ala Ser Ala Arg Ala Val Tyr Ser Leu Phe Ser Tyr Ser lie 
275 280 285 

Leu His Asp Leu Ser Pro Lys Val Trp Val Ala Ser Glu Ser Trp Leu 
290 295 300 

Thr Ser Asp Leu Val Met Thr Leu Pro Asn lie Ala Arg Val Gly Thr 
305 310 315 320 

Val Leu Gly Phe Leu Gin Arg Gly Ala Leu Leu Pro Glu Phe Ser His 
325 330 335 

Tyr Val Glu Thr Arg Leu Ala Leu Ala Ala Asp Pro Thr Phe Cys Ala 
340 345 350 

Ser Leu Lys Ala Glu Leu Asp Leu Glu Glu Arg Val Met Gly Pro Arg 
355 360 365 

Cys Ser Gin Cys Asp Tyr lie Met Leu Gin Asn Leu Ser Ser Gly Leu 
370 375 380 

Met Gin Asn Leu Ser Ala Gly Gin Leu His His Gin lie Phe Ala Thr 
385 390 395 400 

Tyr Ala Ala Val Tyr Ser Val Ala Gin Ala Leu His Asn Thr Leu Gin 
405 410 415 

Cys Asn Val Ser His Cys His Thr Ser Glu Pro Val Gin Pro Trp Gin 
420 425 430 

Leu Leu Glu Asn Met Tyr Asn Met Ser Phe Arg Ala Arg Asp Leu Thr 
435 440 445 

Leu Gin Phe Asp Ala Lys Gly Ser Val Asp Met Glu Tyr Asp Leu Lys 
450 455 460 

Met Trp Val Trp Gin Ser Pro Thr Pro Val Leu His Thr Val Gly Thr 
465 470 475 480 



Phe Asn Gly Thr Leu Gin Leu Gin His Ser Lys Met Tyr Trp Pro Gly 
485 490 495 



oo 



Asn Gin Val Pro Val 
500 

Val Arg Arg Val Lys 
515 

Cys Lys Ala Gly Ser 
530 

Pro Cys Gly Lys Asp 
545 

Pro Arg Arg Pro Lys 
565 

Leu Leu Leu Leu Leu 
580 

Gly Leu Phe Val His 
595 

Gly Ser Leu Phe Cys 
610 

Ser Val Leu Leu Phe 
625 

Gin Gin Pro Met Ala 
645 

Phe Leu Gin Ala Ala 
660 

Trp Ala Asn Trp Leu 
675 

Val Val Leu Leu Ala 
690 

Leu Met Ala Phe Pro 
705 

Thr Glu Val Leu Glu 
725 

Leu Val His lie Thr 
740 

Thr Phe Leu Val Gin 
755 

Leu Thr Phe Ala Met 
770 

Pro Leu Leu Ala Asn 
785 



13 

Ser Gin Cys Ser Arg 
505 

Gly Phe His Ser Cys 
520 

Tyr Arg Lys His Pro 
535 

Gin Trp Ser Pro Glu 
550 

Phe Leu Ala Trp Gly 
570 

Cys Leu Val Leu Gly 
585 

Tyr Trp Asp Ser Pro 
600 

Phe Gly Leu lie Cys 
615 

Pro Gly Arg Pro Arg 
630 

His Leu Pro Leu Thr 
650 

Glu lie Phe Val Glu 
665 

Cys Ser Tyr Leu Arg 
680 

Thr Leu Val Glu Ala 
695 

Pro Glu Val Val Thr 
710 

His Cys Arg Met Arg 
730 

Asn Ala Val Leu Ala 
745 

Ser Gin Pro Gly Arg 
760 

Leu Ala Tyr Phe lie 
775 

Val Gin Val Ala Tyr 
790 



Gin Cys Lys Asp Gly Gin 
510 

Cys Tyr Asp Cys Val Asp 
525 

Asp Asp Phe Thr Cys Thr 
540 

Lys Ser Thr Thr Cys Leu 
555 560 

Glu Pro Ala Val Leu Ser 
575 

Leu Thr Leu Ala Ala Leu 
590 

Leu Val Gin Ala Ser Gly 
605 

Leu Gly Leu Phe Cys Leu 
620 

Ser Ala Ser Cys Leu Ala 
635 640 

Gly Cys Leu Ser Thr Leu 
655 

Ser Glu Leu Pro Leu Ser 
670 

Gly Pro Trp Ala Trp Leu 
685 

Ala Leu Cys Ala Trp Tyr 
700 

Asp Trp Gin Val Leu Pro 
715 720 

Ser Trp Val Ser Leu Gly 
735 

Phe Leu Cys Phe Leu Gly 
750 

Tyr Asn Arg Ala Arg Gly 
765 

lie Trp Val Ser Phe Val 
780 

Gin Pro Ala Val Gin Met 
795 800 



oo no 



Gly Ala lie Leu Phe Cys Ala Leu 
805 

Pro Lys Cys Tyr Val Leu Leu Trp 
820 

Phe Phe Leu Gly Arg Ser Pro Lys 
835 840 

Ser Ser Glu Ala Thr Arg Gly His 
850 855 



14 

Gly lie Leu Ala Thr Phe His Leu 
810 815 

Leu Pro Glu Leu Asn Thr Gin Glu 
825 830 

Glu Ala Ser Asp Gly Asn Ser Gly 
845 

Ser Glu 



<210> 15 

<211> 8194 

<212> DNA 

<213> Homo sapiens 

<220> 

<221> modified_base 
<222> (1251)..(1300) 

<223> a, c, t, g, other or unknown 
<220> 

<221> modified_base 
<222> (1951)..(2000) 

<223> a, c, t, g, other or unknown 



<400> 15 

gagaatctcg 

gcctccgagc 

ccgatctggt 

agccggccgg 

aaacaccggg 

aacatgtcta 

gtaacaaggc 

tggggcaggg 

aaagttctga 

aaatgccaga 

ccgtccagag 

agttcctgag 

gggctccagt 

tatttaagca 

gccagcatgc 

tgggcctttg 

ctcctggcag 

gtgaccctgt 

ctatagggcc 

gaactgtccc 

ctagacactt 

nnnnnnnnnn 

tcactttctc 

cttcaggacc 

gagcttgaga 

tccctttgct 

ttctcagctg 

ccacctcttc 

gcccaacatc 



cgagatcccg 
cgccggcgcc 
cgaggggctc 
agagagaaag 
atattttttt 
tttgcatacc 
gaaagtatat 
gggtgtcgac 
aacctcgcaa 
gctccttttc 
gaagggtcac 
tgggaccgca 
cccacccctt 
actggcctcc 
tgctctgcac 
cctgccatag 
gcctgttccc 
gtgacaggtg 
cctctggctg 
caggccttgt 
cggccagttt 
nnnnnnnnnn 
tctctctctg 
ttttcgatgc 
gcccttgttg 
cccaagcctc 
tctcttactg 
caggctatgc 
accctggggt 



tcggtccgcc 
ctctgccggc 
cacggaggac 
ccagaaacct 
tctcctgcag 
ttcggtttgc 
gacaatttgc 
tcaaagctgt 
cacccggaga 
taagccaggt 
tgggtgccac 
ggcccggaat 
ttgggggcct 
ttagaggcca 
ggctcgcctg 
cacggagtct 
tctccattct 
agtgaggggc 
ccatcctcca 
tcatcaatcc 
ccaattattt 
nnnnnnnnnn 
gaaaacactg 
taataagttt 
aagttgtggt 
agagtctagg 
gctttctcca 
ggcttggggt 
accagctgta 



ccgctgccct 
aacctccgga 
tccatttacg 
cgcgaccagc 
aaaaagcttt 
atgcatttgt 
tcagaatctt 
gtctcattta 
aattgtgttc 
gaagtcacag 
ctggtttgca 
gtcaaggcaa 
gaagttagga 
ctccttggcc 
gtcggcctgc 
tctcctgact 
ggctgtctgc 
cagcagagcc 
aacaggacct 
acttgccacc 
cacccttgct 
nnnnnnnnnn 
actaatgtag 
ctccatcagg 
ttgggggact 
aggccagagg 
caggtcttgt 
tgaggagata 
tgatgtgtgt 



cccagctgcc 
agcacactag 
ttacgcaaat 
catgggccac 
aggattggca 
ttcgaagtga 
aatgtcagaa 
gtaaactgag 
cagcctccca 
agcgtggaca 
tctgtgcctt 
acagtcctgc 
agcatccggc 
atgccaggcg 
agcttctcat 
tcaccctccc 
aggtgaggca 
acacttagtg 
tgcctctgcc 
taagtgctgg 
gttagaatgt 
aattccttaa 
caggtttctc 
gccagcttgt 
ggaccgatga 
gtctcagcag 
agcttcaatg 
aacaactcca 
tctgactctg 



gaaaagaggg 
gaggttccag 
tccctacccc 
ctctccggaa 
gtttaaacaa 
gcaaccctgg 
aactggagac 
gcccaggtaa 
cctcgcccca 
gaacccacaa 
cgtcctgccc 
ttcagccact 
agctgccttc 
cgggcatctg 
ttcctgctgc 
cggagattac 
cagacccgag 
ggacccctgg 
tttgcccctt 
ctagaccttc 
nnnnnnnnnn 
actaaatttc 
tgctccagga 
tcctcctact 
cctcaaaggt 
gcctttgtcc 
agcatggcta 
cggccctgct 
ccaatgtgta 



60 

120 

180 

240 

300 

360 

420 

480 

540 

600 

660 

720 

780 

840 

900 

960 

1020 

1080 

1140 

1200 

1260 

1320 

1380 

1440 

1500 

1560 

1620 

1680 

1740 



oo 



oo 



15 



tgccacgctg 

tctccactat 

caccacagcc 

tttgcccatc 

nnnnnnnnnn 

acggggtttc 

ctcggcctcc 

taatataata 

tgttttccta 

gacattagat 

gggttcaagc 

taaatacaga 

tcctaacagg 

caaactgcct 

atgcaggttt 

tcccacccct 

caggctgagg 

gccaggcact 

ttagctatgc 

gcaccatccc 

ggtggacctg 

cactggagaa 

tctctgccca 

gggccaccgt 

tggtgctgac 

ggcacatcac 

agaagagggc 

aggcccctag 

gccaagcttt 

acaacgcata 

cctctggagc 

cacctcctgt 

ctctaaatgc 

gttttttgag 

ctctgcaact 

gggattacag 

agatagagtc 

gagctccgcc 

acgggcgccc 

caccatgtta 

ccaaagtgct 

tagagatggg 

ctcctgcttc 

gatctttctc 

aagatccagg 

ttggtgggga 

gaaaccacca 

tctgtgctgt 

caaggtgcat 

cagtagctat 

cggttcctcc 

cggaaaggac 

acctagagcc 

gtccagctgc 

gagtgtgcag 

gccctgaggg 

cttgggcccc 

gcgactgtct 



agagtgctct 
tcccctacgg 
gccctgctga 
tcccttcagg 
nnnnnnnnnn 
accgtgttag 
caatgtgctg 
aaataattat 
caactagatg 
tctcataagt 
tcctacaaga 
tgaagcttcg 
ccactgacct 
ccagtggaag 
tgtctccttt 
cccccagaac 
ggtgctctcc 

gggggggcct 

ggccagcagc 
caatgacaag 
gatctctctg 
ccaggccact 
ggtgggcgat 
cgtggttgtt 
caacctgact 
tggggtgccc 
tgtccctggc 
gccttgccac 
catggcacac 
ccgggctgtg 
ttgttccagg 
cagggagaac 
caagggggat 
acagtctggc 
tccacctcct 
gcacccacca 
tcgctctgtt 
tcccaggttc 
gccaccacgc 
gccaggatgg 
gggattacag 
gtttcaccat 
ggcctcccaa 
tctgatcctt 
gctaaaactg 
agattgaggg 
ggacggaaac 
ctgtggtggc 
ttccttctac 
aacataattg 
acatggtctc 
aaccaggtaa 
tgggggtgat 
caccactcta 
atgccctggg 
cagatgcaca 
tacgtgtggc 
tgaagggcac 



ccctgccagg 
tgctggcagt 
gccctttcct 
caagtctggg 
gccaccatgc 
ccaggctggt 
ggattacagg 
acaactcacc 
gtcccatctg 
agcgtgcaac 
atctgatgct 
cttactcacc 
aacttctgcc 
tccctgaagg 
gcttggaatg 
ctgccccagt 
tggtctcccc 
tcagtggaga 
gagacgctca 
taccaggtgg 
gttggcagca 
ggtcagggga 
gagaggatgc 
ttttccagcc 
ggcaaggtgt 
gggatccagc 
ctgaaggcgt 
aagggctcct 
acgatgccca 
tatgcggtgg 
ggccgagtct 
agccaatcct 
aaatgccact 
tctgtcaccc 
gggttcaagt 
ccatgcctgg 
gcccaggctg 
actccattcc 
ccagctaatt 
tctcaatctc 
gcgtgagcca 
gttggccagg 
agtgctggga 
gccttctctc 
tctgtaaagg 
gcttcctaag 
ccaggaaggc 
ttcatgatac 
acaaggacac 
cctgggactg 
cagttcagct 
tggggatgtg 
gctgacacag 
cccatcctgg 
gcggaagttc 
gagattctgt 
ccctctggct 
cagcgagtgg 



gcaacaccac 
gattgggcct 
ggtgcccatg 
nnnnnnnnnn 
ccggctaatt 
cgcaaactcc 
tgtgagccac 
ataatgtaga 
ggggtgatgg 
ccagatccct 
gctgctgatc 
agctgctcac 
ctgacctaca 
tccccaaaca 
catcccctca 
ggagccttcg 
ggctccctgt 
ctgaaatggc 
gcgtgaagcg 
agaccatggt 
gtgacgacta 
tctgcattgc 
agtgcctcat 
ggcagttggc 
gggtcgcctc 
gcattgggat 
ttgaagaagc 
ggtgcagcag 
agctcaaagc 
cccatggcct 
acccctggca 
gagatgagca 
aacttgaggt 
aggctgcagt 
gattctcttg 
ataatttttc 
gaatgcagtg 
cctgcctcag 
ttttttgtat 
ctgaccttgt 
ccgcacccgg 
ctggtctcga 
ttacaggcat 
acccactgtg 
agtgtttgtt 
aaggaaggga 
cccaggccct 
gcgtttcttt 
tgtggcgttt 
gaatggaccc 
aaacataaat 
gctactcacc 
tgtacaggga 
ccagggaagc 
acacgaccag 
tttctgttcc 
tcttacaggt 
ttacgggttt 



atagagctcc 
gacagcacca 
gtaagctgga 
nnnnnnnnnn 
tttttgtatt 
taacctcgtg 
tgcacccggc 
atcagtggga 
gagacagtga 
cgcatgtgca 
tgacaggagg 
ctcctcctgt 
catgcttctc 
cacgggacta 
ccccttgtcc 
caggtgattt 
atccccacac 
tgaacgggac 
gcagtatccc 
gctgctgctg 
tgggcagcta 
tttcaaggac 
gcgccacctg 
cagggtgttt 
agaagcctgg 
ggtgctgggc 
ctatgcccgg 
caatcagctc 
cttctccatg 
ccaccagctc 
ggtaagagag 
gagtgggcac 
tttttgtttt 
gtagtgatgc 
cctcggcctc 
ttttcttttt 
gtgcgatctt 
cctcccaagt 
tttgagtaga 
catccgccca 
cctaattttt 
actcctggca 
tagctctctt 
tcttggaagt 
agaggcctcc 
cgagaccttc 
tgcttctggg 
cagcttttgg 
aatgacaaca 
aagtggacct 
gagaccaaaa 
atgtaactgg 
gcaggagggg 
agggaagaca 
gggccctgcc 
acatgtgagc 
gcctaagtct 
ccatcactgc 



aaggagacct 
accgtgctgc 
gcctcagacc 
nnnnnnnnnn 
tttagtagag 
atccacccac 
cataatgtat 
gccctgagct 
cagatcatca 
gttcacagta 
ggagcagctg 
gaggcccggt 
ttcttccttg 
tttcactcct 
ccaggcagat 
gtcagtttca 
ccagcacagg 
ctcccataga 
tctttcctgc 
cagaagttcg 
ggggtgcagg 
atcatgccct 
gcccaggccg 
ttcgagtccg 
gccctctcca 
gtggccatcc 
gcagacaaga 
tgcagagaat 
agttctgcct 
ctgggctgtg 
cccaccccag 
tctccggtca 
gttttgtttt 
gatctcggct 
ctgagtagct 
tttttttttg 
ggctcactgt 
aggtgggact 
gacggggttt 
cctcgtcctc 
gtatttttag 
tcaagtgatc 
ctcttagaca 
gtcaagtgat 
tctcaggagg 
ctgatgggct 
accatgtggg 
agcagatcca 
gagatcccct 
tcacggtcct 
tccagtggca 
cttatgggca 
ggccccaggg 
ctccgtaggc 
ctgggagtga 
tgtcctttga 
gtgtgttcca 
tgctttgagt 



1800 
1860 
1920 
1980 
2040 
2100 
2160 
2220 
2280 
2340 
2400 
2460 
2520 
2580 
2640 
2700 
2760 
2820 
2880 
2940 
3000 
3060 
3120 
3180 
3240 
3300 
3360 
3420 
3480 
3540 
3600 
3660 
3720 
3780 
3840 
3900 
3960 
4020 
4080 
4140 
4200 
4260 
4320 
4380 
4440 
4500 
4560 
4620 
4680 
4740 
4800 
4860 
4920 
4980 
5040 
5100 
5160 
5220 



oo 
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gtgtgccctg tggggctggg accttcctca 
cgagctaccc agcactcccg ggggctgcac 
gtgccctgcc ccagaaccaa ggcccagtca 
acacctgcta ccagacagaa ttctgatcaa 
gcctgtaatc ccagcacttt gggaggctga 
gagaccagcc tggccaacat ggtgaaaccc 
gggtgtggtg gcgcgtgcct gtaatcccag 
ttgaacccag gaggcggagg ttgcagtgag 
cgagaattcg tccccccaaa aaaagaaagg 
cccagcactt tgggaggccg aggtgggtgg 
ctgaccaaca tggtgaaacc ccatctctac 
gtggcgtgtg cctgtaattc cagctactcg 
cgggaggcgg aggttgcagt gagccaagat 
gagaaaaact ctgtctcaaa aaaaaagaaa 
agactgaggt gtgtcctctg ttagagagct 
tcctgaattc aacctctttc tctaaatgaa 
tcctactgtc ccttctgttg cccatgccaa 
gaatacagat actagcgtgt ctgcagcaga 
caaggtcaag aacagagagc aaattaggta 
aggggccaca ttctttcctt tcaccatctc 
tcagagggtc aggactcaga gaaaccacag 
atgctggcaa gagagagggg ttacaatgcc 
tcgtaacctc tctggtatgt gggcagagct 
aaaccctcat gggatcatga gccatacaga 
taacacaggc attttgagga aatgcgtggc 
cactatgcct agtatagtct agctgccctg 
tatttcctat tcctactctg ctcatctggc 
gacctctaca gatgccagcc ttgtgggaaa 
tgcttcccgc gcactgtggt gtttttggct 
gcagctaaca cgctgctgct gctgctgctg 
ctagacaccc ctgtggtgag gtcagcaggg 
ctggcagcag gtagtggcag cctctatggc 
ttgctacgcc aggccctctt tgcccttggt 
cgctcattcc aactaatcat catcttcaag 
gcctgggtcc aaaaccacgg tgctggcctg 
cttatctgtc taacttggct ggtggtgtgg 
ttcccccatc tggtgatgct tgagtgcaca 
ttcctctaca atggcctcct ctccatcagt 
ttgccagaga actacaacga ggccaaatgt 
tcctggatcg ccttcttcac cacggccagc 
aacatgatgg ctgggctgag cagcctgagc 
tgctacgtga tcctctgccg cccagacctc 
caggactaca cgaggcgctg cggctccacc 
gccttctctg ccctgagggt cgaaggtcga 
gcatcgcggt ctggggttgg gacgtgtaag 
ctgccaataa agaagtgaaa tgcgtatctg 
acggattcaa gtctgaaccc agagcctgga 
ggcaactccg gaggcgggcc cagcgccaaa 
cattggccgt tctctgcggg gccccgccct 
cgaggcgcac ctcctggcct gcacgctttg 



acaagagtgg tgagtgggca atggagcagg 5280 
ggtggaggga gggcctccct tgggccccat 5340
ctgggctgcc agttagcttc aggttggagg 5400 
gagaatcagc cactgggtgc ggtggctcat 5460 
ggcgggtgga tcacttgagg tcgggagttc 5520 
catctctacc aaaaatataa aaaattagct 5580 
ctactcggga ggctgaggca ggagaatcac 5640
ccaagatgca ttccagcctg gaccacaaag 5700 
aggccgggcg cggtggctca cacctgtaat 5760 
atcacctgag gtcaggagtt cgagaccagc 5820 
taaaaataca aaaaaagtta gccgggcgtt 5880 
ggaggctgag gcaggagaat tgcttgaacc 5940
tgcaccattg cactccagcc tgggcgacaa 6000 
gaaagaaaga attagccaac tgaaagcctt 6060 
gtcatcacaa ctcctacaaa agcagtcgta 6120 
tatagctatt gttccctttg tgccctcttg 6180 
agacagctag ctccttgaac agcttggcct 6240 
gaaaaaaaca gcattcccca tccagaaatg 6300 
gctaaggact caggtcctta gttggtgtcc 6360 
tgtagggaca ggaatacttc ccttctgtcc 6420
agcagcagct caggaaagtg gttcatggaa 6480 
ctcccttggg agcaggctgc tcccatcaga 6540 
accaggttaa ggtcctccct agggtttgca 6600 
accgacctgt gtgtctccag agtctgtaat 6660 
ctcaggcccc actcccggct acccccatcc 6720 
gtacaattct cccagtatct tgcaggcccc 6780 
tctcaggaac cttcttggcc ttccctttca 6840 
gaagagtggg cacctgaggg aagccagacc 6900 
ttgcgtgagc acacctcttg ggtgctgctg 6960 
cttgggactg ctggcctgtt tgcctggcac 7020
ggccgcctgt gctttcttat gctgggctcc 7080 
ttctttgggg aacccacaag gcctgcgtgc 7140 
ttcaccatct tcctgtcctg cctgacagtt 7200 
ttttccacca aggtacctac attctaccac 7260 
tttgtgatga tcagctcagc ggcccagctg 7320 
accccactgc ctgctaggga ataccagcgc 7380 
gagaccaact ccctgggctt catactggcc 7440 
gcctttgcct gcagctacct gggtaaggac 7500 
gtcaccttca gcctgctctt caacttcgtg 7560 
gtctacgacg gcaagtacct gcctgcggcc 7620
agcggcttcg gtgggtattt tctgcctaag 7680 
aacagcacag agcacttcca ggcctccatt 7740 
tgaccagtgg gtcagcaggc acggctggca 7800 
gcaggccggg ggtgtccggg aggtctttgg 7860 
cgcctgggag agcctagacc aggctccggg 7920 
gtctcctgtc gtgggagagt gtgaggtgta 7980
aaaggctgac cgcccagatt gacgttgcta 8040 
agaacagggc gaggcgtcgt ccccgcatcc 8100 
cgggggccgg agctagaagc tctacgcttc 8160 
acgt 8194 



<210> 16 

<211> 2526 

<212> DNA 

<213> Homo sapiens 



on 



oo 
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<400> 16 

atgctgctct 

tttgcctgcc 

gcaggcctgt 

ctgtgtgaca 

cttggggttg 

cagctgtatg 

ctgccagggc 

ctggcagtga 

cctttcctgg 

cagtatccct 

ctgctgctgc 

gggcagctag 

ttcaaggaca 

cgccacctgg 

agggtgtttt 

gaagcctggg 

gtgctgggcg 

tatgcccggg 

aatcagctct 

ttctccatga 

caccagctcc 

cttttggagc 

gacaacagag 

tggaccttca 

accaaaatcc 

tgtcttgaag 

ccctgtgggg 

aaagaagagt 

gctttgcgtg 

ctgcttggga 

gggggccgcc

ggcttctttg 

ggtttcacca 

aagttttcca 

ctgtttgtga 

tggaccccac 

acagagacca 

agtgcctttg 

tgtgtcacct 

agcgtctacg 

agcagcggct 

ctcaacagca 

acctga 



gcacggctcg 
atagcacgga 
tccctctcca 
ggtcttgtag 
aggagataaa 
atgtgtgttc 
aacaccacat 
ttgggcctga 
tgcccatgat 
ctttcctgcg 
agaagttcgg 
gggtgcaggc 
tcatgccctt 
cccaggccgg 
tcgagtccgt 
ccctctccag 
tggccatcca 
cagacaagaa 
gcagagaatg 
gttctgccta 
tgggctgtgc 
agatccacaa 
atcccctcag 
cggtcctcgg 
agtggcacgg 
ggcaccagcg 
ctgggacctt 
gggcacctga 
agcacacctc 
ctgctggcct 
tgtgctttct 
gggaacccac 
tcttcctgtc 
ccaaggtacc 
tgatcagctc 
tgcctgctag 
actccctggg 
cctgcagcta 
tcagcctgct 
acggcaagta 
tcggtgggta 
cagagcactt 



cctggtcggc 
gtcttctcct 
ttctggctgt 
cttcaatgag 
caactccacg 
tgactctgcc 
agagctccaa 
cagcaccaac 
tagctatgcg 
caccatcccc 
gtggacctgg 
actggagaac 
ctctgcccag 
ggccaccgtc 
ggtgctgacc 
gcacatcact 
gaagagggct 
ggcccctagg 
ccaagctttc 
caacgcatac 
ctctggagct 
ggtgcatttc 
tagctataac 
ttcctccaca 
aaaggacaac 
agtggttacg 
cctcaacaag 
gggaagccag 
ttgggtgctg 
gtttgcctgg 
tatgctgggc 
aaggcctgcg 
ctgcctgaca 
tacattctac 
agcggcccag 
ggaataccag 
cttcatactg 
cctgggtaag 
cttcaacttc 
cctgcctgcg 
ttttctgcct 
ccaggcctcc 



ctgcagcttc 
gacttcaccc 
ctgcaggtga 
catggctacc 
gccctgctgc 
aatgtgtatg 
ggagaccttc 
cgtgctgcca 
gccagcagcg 
aatgacaagt 
atctctctgg 
caggccactg 
gtgggcgatg 
gtggttgttt 
aacctgactg 
ggggtgcccg 
gtccctggcc 
ccttgccaca 
atggcacaca 
cgggctgtgt 
tgttccaggg 
cttctacaca 
ataattgcct 
tggtctccag 
caggtgccta 
ggtttccatc 
agtgacctct 
acctgcttcc 
ctggcagcta 
cacctagaca 
tccctggcag 
tgcttgctac 
gttcgctcat 
cacgcctggg 
ctgcttatct 
cgcttccccc 
gccttcctct 
gacttgccag 
gtgtcctgga 
gccaacatga 
aagtgctacg 
attcaggact 



tcatttcctg 
tccccggaga 
ggcacagacc 
acctcttcca 
ccaacatcac 
ccacgctgag 
tccactattc 
ccacagccgc 
agacgctcag 
accaggtgga 
ttggcagcag 
gtcaggggat 
agaggatgca 
tttccagccg 
gcaaggtgtg 
ggatccagcg 
tgaaggcgtt 
agggctcctg 
cgatgcccaa 
atgcggtggc 
gccgagtcta 
aggacactgt 
gggactggaa 
ttcagctaaa 
agtctgtgtg 
actgctgctt 
acagatgcca 
cgcgcactgt 
acacgctgct 
cccctgtggt 
caggtagtgg 
gccaggccct 
tccaactaat 
tccaaaacca 
gtctaacttg 
atctggtgat 
acaatggcct 
agaactacaa 
tcgccttctt 
tggctgggct 
tgatcctctg 
acacgaggcg 



ctgctgggcc 
ttacctcctg 
cgaggtgacc 
ggctatgcgg 
cctggggtac 
agtgctctcc 
ccctacggtg 
cctgctgagc 
cgtgaagcgg 
gaccatggtg 
tgacgactat 
ctgcattgct 
gtgcctcatg 
gcagttggcc 
ggtcgcctca 
cattgggatg 
tgaagaagcc 
gtgcagcagc 
gctcaaagcc 
ccatggcctc 
cccctggcag 
ggcgtttaat 
tggacccaag 
cataaatgag 
ttccagcgac 
tgagtgtgtg 
gccttgtggg 
ggtgtttttg 
gctgctgctg 
gaggtcagca 
cagcctctat 
ctttgccctt 
catcatcttc 
cggtgctggc 
gctggtggtg 
gcttgagtgc 
cctctccatc 
cgaggccaaa 
caccacggcc 
gagcagcctg 
ccgcccagac 
ctgcggctcc 



60 

120 

180 

240 

300 

360 

420 

480 

540 

600 

660 

720 

780 

840 

900 

960 

1020 

1080 

1140 

1200 

1260 

1320 

1380 

1440

1500 

1560 

1620 

1680 

1740 

1800 

1860 

1920 

1980 

2040 

2100 

2160 

2220 

2280 

2340 

2400 

2460 

2520 

2526 



<210> 17 

<211> 841 

<212> PRT 

<213> Homo sapiens 

<400> 17 

Met Leu Leu Cys Thr Ala Arg Leu Val Gly Leu Gln Leu Leu Ile Ser
1 5 10 15 

Cys Cys Trp Ala Phe Ala Cys His Ser Thr Glu Ser Ser Pro Asp Phe 
20 25 30 



no no 
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Thr Leu Pro Gly Asp Tyr Leu Leu Ala Gly Leu Phe Pro Leu His Ser 
35 40 45 

Gly Cys Leu Gln Val Arg His Arg Pro Glu Val Thr Leu Cys Asp Arg
50 55 60

Ser Cys Ser Phe Asn Glu His Gly Tyr His Leu Phe Gln Ala Met Arg
65 70 75 80

Leu Gly Val Glu Glu Ile Asn Asn Ser Thr Ala Leu Leu Pro Asn Ile
85 90 95

Thr Leu Gly Tyr Gln Leu Tyr Asp Val Cys Ser Asp Ser Ala Asn Val
100 105 110

Tyr Ala Thr Leu Arg Val Leu Ser Leu Pro Gly Gln His His Ile Glu
115 120 125

Leu Gln Gly Asp Leu Leu His Tyr Ser Pro Thr Val Leu Ala Val Ile
130 135 140 

Gly Pro Asp Ser Thr Asn Arg Ala Ala Thr Thr Ala Ala Leu Leu Ser 
145 150 155 160 

Pro Phe Leu Val Pro Met Ile Ser Tyr Ala Ala Ser Ser Glu Thr Leu
165 170 175

Ser Val Lys Arg Gln Tyr Pro Ser Phe Leu Arg Thr Ile Pro Asn Asp
180 185 190

Lys Tyr Gln Val Glu Thr Met Val Leu Leu Leu Gln Lys Phe Gly Trp
195 200 205

Thr Trp Ile Ser Leu Val Gly Ser Ser Asp Asp Tyr Gly Gln Leu Gly
210 215 220

Val Gln Ala Leu Glu Asn Gln Ala Thr Gly Gln Gly Ile Cys Ile Ala
225 230 235 240

Phe Lys Asp Ile Met Pro Phe Ser Ala Gln Val Gly Asp Glu Arg Met
245 250 255

Gln Cys Leu Met Arg His Leu Ala Gln Ala Gly Ala Thr Val Val Val
260 265 270

Val Phe Ser Ser Arg Gln Leu Ala Arg Val Phe Phe Glu Ser Val Val
275 280 285 

Leu Thr Asn Leu Thr Gly Lys Val Trp Val Ala Ser Glu Ala Trp Ala 
290 295 300 

Leu Ser Arg His Ile Thr Gly Val Pro Gly Ile Gln Arg Ile Gly Met
305 310 315 320



Val Leu Gly Val Ala Ile Gln Lys Arg Ala Val Pro Gly Leu Lys Ala
325 330 335 



GO OO 
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Phe Glu Glu Ala Tyr Ala Arg Ala Asp Lys Lys Ala Pro Arg Pro Cys 
340 345 350 

His Lys Gly Ser Trp Cys Ser Ser Asn Gln Leu Cys Arg Glu Cys Gln
355 360 365 

Ala Phe Met Ala His Thr Met Pro Lys Leu Lys Ala Phe Ser Met Ser 
370 375 380 

Ser Ala Tyr Asn Ala Tyr Arg Ala Val Tyr Ala Val Ala His Gly Leu 
385 390 395 400 

His Gln Leu Leu Gly Cys Ala Ser Gly Ala Cys Ser Arg Gly Arg Val
405 410 415

Tyr Pro Trp Gln Leu Leu Glu Gln Ile His Lys Val His Phe Leu Leu
420 425 430 

His Lys Asp Thr Val Ala Phe Asn Asp Asn Arg Asp Pro Leu Ser Ser 
435 440 445 

Tyr Asn Ile Ile Ala Trp Asp Trp Asn Gly Pro Lys Trp Thr Phe Thr
450 455 460

Val Leu Gly Ser Ser Thr Trp Ser Pro Val Gln Leu Asn Ile Asn Glu
465 470 475 480

Thr Lys Ile Gln Trp His Gly Lys Asp Asn Gln Val Pro Lys Ser Val
485 490 495

Cys Ser Ser Asp Cys Leu Glu Gly His Gln Arg Val Val Thr Gly Phe
500 505 510 

His His Cys Cys Phe Glu Cys Val Pro Cys Gly Ala Gly Thr Phe Leu 
515 520 525 

Asn Lys Ser Asp Leu Tyr Arg Cys Gln Pro Cys Gly Lys Glu Glu Trp
530 535 540

Ala Pro Glu Gly Ser Gln Thr Cys Phe Pro Arg Thr Val Val Phe Leu
545 550 555 560 

Ala Leu Arg Glu His Thr Ser Trp Val Leu Leu Ala Ala Asn Thr Leu 
565 570 575 

Leu Leu Leu Leu Leu Leu Gly Thr Ala Gly Leu Phe Ala Trp His Leu 
580 585 590 

Asp Thr Pro Val Val Arg Ser Ala Gly Gly Arg Leu Cys Phe Leu Met 
595 600 605 

Leu Gly Ser Leu Ala Ala Gly Ser Gly Ser Leu Tyr Gly Phe Phe Gly 
610 615 620

Glu Pro Thr Arg Pro Ala Cys Leu Leu Arg Gln Ala Leu Phe Ala Leu
625 630 635 640 



no no 



20 

Gly Phe Thr Ile Phe Leu Ser Cys Leu Thr Val Arg Ser Phe Gln Leu
645 650 655

Ile Ile Ile Phe Lys Phe Ser Thr Lys Val Pro Thr Phe Tyr His Ala
660 665 670 



Trp Val Gln Asn
675

Ala Gln Leu Leu
690 

Pro Ala Arg Glu 
705 

Thr Glu Thr Asn 



Leu Leu Ser Ile
740 

Pro Glu Asn Tyr 
755 

Asn Phe Val Ser 
770 



His Gly Ala Gly 
680 

Ile Cys Leu Thr
695

Tyr Gln Arg Phe
710 

Ser Leu Gly Phe 
725 

Ser Ala Phe Ala 



Asn Glu Ala Lys 
760 

Trp Ile Ala Phe
775 



Leu Phe Val Met 



Trp Leu Val Val 
700 

Pro His Leu Val 
715 

Ile Leu Ala Phe
730 

Cys Ser Tyr Leu 
745 

Cys Val Thr Phe 



Phe Thr Thr Ala 
780 



Ile Ser Ser Ala
685 

Trp Thr Pro Leu 



Met Leu Glu Cys 
720 

Leu Tyr Asn Gly 
735 

Gly Lys Asp Leu 
750 

Ser Leu Leu Phe 
765 

Ser Val Tyr Asp 



Gly Lys Tyr Leu Pro Ala Ala Asn
785 790 

Ser Ser Gly Phe Gly Gly Tyr Phe 
805 

Cys Arg Pro Asp Leu Asn Ser Thr 
820 

Asp Tyr Thr Arg Arg Cys Gly Ser 
835 840 



Met Met Ala Gly Leu Ser Ser Leu 
795 800 

Leu Pro Lys Cys Tyr Val Ile Leu
810 815

Glu His Phe Gln Ala Ser Ile Gln
825 830

Thr 



<210> 18 
<211> 14 
<212> PRT 

<213> Artificial Sequence 
<220> 

<221> MOD_RES

<222> (1) 

<223> Thr or Arg 

<220> 

<221> MOD_RES

<222> (3)

<223> Phe or Leu

<220>

<221> MOD_RES



oo 



OO 
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<222> (4) 

<223> Arg, Gln or Pro
<220> 

<221> MOD_RES 

<222> (6) 

<223> Arg or Thr 

<220> 

<221> MOD_RES 
<222> (7) 

<223> Ser, Pro or Val 
<220> 

<221> MOD_RES
<222> (8) 

<223> Val, Glu, Arg, Lys or Thr 
<220> 

<221> MOD_RES 

<222> (11) 

<223> Ala or Glu 

<220> 

<221> MOD_RES 

<222> (12) 

<223> Trp or Leu 

<220> 

<221> MOD_RES 
<222> (13) 

<223> Arg, His or Gly 
<220> 

<223> Description of Artificial Sequence: Consensus 
sequence 

<400> 18 

Xaa Cys Xaa Xaa Arg Xaa Xaa Xaa Phe Leu Xaa Xaa Xaa Glu 
1 5 10 



<210> 19 
<211> 15 
<212> PRT 

<213> Artificial Sequence 
<220> 

<221> MOD_RES

<222> (1)

<223> Leu or Gln

<220> 

<221> MOD_RES 
<222> (3) 

<223> Glu, Gly or Thr 



no 



no 



<220> 

<221> MOD_RES 
<222> (4) 

<223> Asn, Arg or Cys 



<220>
<221> MOD_RES
<222> (7)
<223> Arg or Glu

<220>
<221> MOD_RES
<222> (9)
<223> Arg or Lys

<220>
<221> MOD_RES
<222> (10)
<223> Cys, Gly or Phe



<220> 

<221> MOD_RES 
<222> (11) 

<223> Val, Leu or Ile
<220> 

<221> MOD_RES 

<222> (13) 

<223> Phe or Leu 

<220> 

<221> MOD_RES

<222> (14) 

<223> Ala or Asn 

<220> 

<221> MOD_RES 

<222> (15) 

<223> Met or Leu 



<220> 

<223> Description of Artificial Sequence: Consensus 
sequence 

<400> 19 

Xaa Pro Xaa Xaa Tyr Asn Xaa Ala Xaa Xaa Xaa Thr Xaa Xaa Xaa 
1 5 10 15 



<210> 20 

<211> 3563 

<212> DNA 

<213> Homo sapiens 



<400> 20 

agcctggcag tggcctcagg cagagtctga 
ggacaccact ggggccccag ggtgtggcaa 
tcctctgccc gctccccgcc ccgggctcac 



cgcgcacaaa ctttcaggcc caggaagcga 60 
gtgaggatgg caagggtttt gctaaacaaa 120 
tccatgtgag gccccagtcg gggcagccac 180 



oo 



oo 
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ctgccgtgcc 
ctctgggctc 
atgaaggggg 
ctccgcagcc 
tgggtcgggg 
ctgcggttct 
aaatggccgt 
acgacctctt 
tggccaaggc 
gtgtgctggc 
tcagcttctt 
cctgccccgt 
cctgggagcc 
ggagctgctg 
tgtgcagctg 
cctgggcagc 
ggcacgcggc 
gcggctgggg 
gctgctgttc 
gctctcgccc 
gctgcccggc 
gcacgagttc 
ctctgccctg 
gcagtgtgac 
ctctgtctac 
cgcctcaggc 
gggtgtgctg 
aggtggctgg 
gaccttccac 
gtacgacctg 
gttcaacggc 
ggtgaggtga 
ctgggggtgg 
caggcctgtg 
cgccgggtca 
taccggcaaa 
agggtcctgc 
gcgcccttct 
tccccggagc 
ccggctgtgc 
ttggggctgt 
gcctgctttg 
cagcccagcc 
tgcctgagca 
agctgggcag 
ctggccatgc 
gtggtgacgg 
tgggtcagct 
ggcactttcc 
gccatgctgg 
gtggtcctca 
gctgccttcc 
gagttcttcc 
aatcagggga 
gctgcgatcc 
aggttctgac 
acgtggacac 



tgttggaagt 
tcctgcaccc 
actacgtgct 
ggacacggcc 
tcagggtgac 
gtgtggcccc 
ggaggagatc 
tgatacgtgc 
aggcagccgc 
tgtcatcggg 
cctcatgccc 
gggagcccct 
ctgtgtcaga 
agcgcccggg 
acggccgccg 
gacgacgagt 
atctgcatcg 
aaggtgcagg 
gcctccgtgc 
aaggtgtggg 
atggcccaga 
ccccagtacg 
ggcgagaggg 
tgcatcacgc 
gcagctgtgt 
tgccccgcgc 
tcctctgcat 
cggctcagcc 
gtgggcgggc 
aagctgtggg 
agcctcagga 
gggtgggtgt 

gggccgttcc 
cgcagaagcc 
aggggttcca 
acccaggtga 
caagtcctga 
cctctctcac 
gaagcacacg 
tgctgctgct 
tcgttcacca 
gcctggtgtg 
ctgcccgatg 
cactcttcct 
accggctgag 
tggtggaggt 
actggcacat 
tcggcctagc 
tggtgcggag 
cctacttcat 
ggcccgccgt 
acctgcccag 
tgggaggggg 
aacatgagtg 
cccccaagcc 
cccaggttgt 
ccctgtgacc 



tgcctctgcc 
tgggacgggg 

gggggggctg 

cagcagccct 
caggtctggg 
aggttctcct 
aacaacaagt 
tcggagcctg 
gacatcgccg 
ccccactcgt 
cagtggggcg 
tgtgtcagga 
agatgctctt 
agaccttccc 
cggagctgct 
acggccggca 
cgcacgaggg 
acgtcctgca 
acgccgccca 
tggccagcga 
tgggcacggt 
tgaagacgca 
agcagggtct 
tgcagaacgt 
atagcgtggc 
aggaccccgt 
gtgcccaggc 
ccgtcccccg 
tgccgctgcg 
tgtggcaggg 
cagagcgcct 
gccaggcgtg 
agtctcccgt 
cgtgtcccgg 
ctcctgctgc 
gccgccttcc 
ctctgagacc 
agacgacatc 
ctgcttccgc 
cctgctgctg 
tcgggacagc 
cctgggcctg 
cctggcccag 
gcaggcggcc 
tggctgcctg 
cgcactgtgc 
gctgcccacg 
gcacgccacc 
ccagccgggc 
cacctgggtc 
gcagatgggc 
gtgttacctg 
ccctggggat 
acccaaccct 
agcaatgacc 
ctcctgaccc 
atc



atgctgggcc 
gccccattgt 
ttccccctgg 
gtgtgcacca 
gtgctcctga 
caaacggcct 
cggatctgct
tggtggccat 
cctactgcaa 
cagagctcgc 
ccccccacca 
gaatgctaca
ggccttgcag 
ctccttcttc 
gcaggagttc 
gggcctgagc
cctggtgccg 
ccaggtgaac 
cgccctcttc 
ggcctggctg 
gcttggcttc 
cctggccctg 
ggaggaggac 
gagcgcaggg
ccaggccctg 
gaagccctgg 
caccaggcac 
cccgcagctc 
gttcgacagc 
ctcagtgccc 
gaagatccgc
cccgtggtag 
gggcatgccc 
tgctcgcggc 
tacgactgtg 
cggcaggcgg
agagcccaca 
gcctgcacct 
cgcaggtctc 
agcctggcgc 
ccactggttc 
gtctgcctca 
cagcccttgt 
gagatcttcg 
cgggggccct 
acctggtacc 
gaggcgctgg
aatgccacgc 
tgctacaacc 
tcctttgtgc 
gccctcctgc 
ctcatgcggc 
gcccaaggcc 
gtgatctcag 
cgtgtctcgc 
tgaccccaca 



ctgctgtcct 
gcctgtcaca 
gcgaggccga
ggtacagagg 
gctggggccg 
gctctgggca 
gcccgggctg 
gaagcccagc 
ctacacgcag 
catggtcacc 
tcacccaccc 
tgcaccccac 
gtcagctacg 
cgcaccgtgc 
ggctggaact 
atcttctcgg
ctgccccgtg 
cagagcagcg 
aactacagca 
acctctgacc 
ctccagaggg 
gccaccgacc 
gtggtgggcc 
ctaaatcacc 
cacaacactc 
caggtgagcc
ggccaccacg 
ctggagaaca 
agcggaaacg
aggctccacg 
tggcacacgt 
cccccgcggc 
agccgagcag
agtgccagga 
tggactgcga
gggtgggaac 
gggtacaaga 
tttgtggcca 
ggttcctggc 
tgggccttgt 
aggcctcggg
gcgtcctcct 
cccacctccc 
tggagtcaga 
gggcctggct 
tggtggcctt 
tgcactgccg 
tggcctttct
gtgcccgtgg 
ccctcctggc 
tctgtgtcct 
agccagggct
agaatgacgg
ccccggtgaa 
tacagagacc 
gtgagcccta



gggcctcagc 
gcaacttagg 
ggaggctggc 
tgggacggcc
aggtggccat 
ctggccatga 
cgcctgggct 
ctcatgttcc 
taccagcccc 
ggcaagttct 
ccaaccaacc 
ccagccctgc 
gtgctagcat
ccagcgaccg 
gggtggccgc 
ccctggccgc 
ccgatgactc 
tgcaggtggt 
tcagcagcag 
tggtcatggg 
gtgcccagct 
cggccttctg 
agcgctgccc 
accagacgtt
ttcagtgcaa 
cgggagatgg
cctgagctgg 
tgtacaacct 
tggacatgga 
acgtgggcag 
ctgacaacca 
agggcgcagc
agccagaccc 
gggccaggtg 
ggcgggcagc
gcagcagggg 
cgaacaccca 
ggatgagtgg 
atggggcgag 
gctggctgct
ggggcccctg 
gttccctggc 
gctcacgggc 
actgcctctg 
ggtggtgctg 
cccgccggag 
cacacgctcc 
ctgcttcctg 
cctcaccttt 
caatgtgcag 
gggcatcctg 
caacaccccc 
gaacacagga 
cccagactta 
ctcccgctct 
ggcctggagc 



240 

300 

360 

420 

480 

540 

600 

660 

720 

780 

840 

900 

960 

1020 

1080 

1140 

1200 

1260 

1320 

1380 

1440 

1500 

1560 

1620 

1680 

1740 

1800 

1860 

1920 

1980 

2040 

2100 

2160 

2220 

2280 

2340 

2400 

2460 

2520 

2580 

2640 

2700 

2760 

2820 

2880 

2940 

3000 

3060 

3120 

3180 

3240 

3300 

3360 

3420 

3480 

3540 

3563 



